{
 "cells": [
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### Note\n",
    "* Instructions have been included for each segment. You do not have to follow them exactly, but they are included to help you think through the steps."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Dependencies and Setup\n",
    "import pandas as pd\n",
    "\n",
    "# File to load (remember to change this path to match your data file)\n",
    "file_to_load = \"Resources/data_csv.csv\"\n",
    "\n",
    "# Read Purchasing File and store into Pandas data frame\n",
    "purchase_data = pd.read_csv(file_to_load)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "metadata": {
    "scrolled": true
   },
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Name</th>\n",
       "      <th>Age</th>\n",
       "      <th>AgeGroup</th>\n",
       "      <th>Item ID</th>\n",
       "      <th>Item Name</th>\n",
       "      <th>Item Price</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>Junayd Pemberton</td>\n",
       "      <td>42</td>\n",
       "      <td>Adult</td>\n",
       "      <td>108</td>\n",
       "      <td>button</td>\n",
       "      <td>8.51</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>Phebe Maguire</td>\n",
       "      <td>40</td>\n",
       "      <td>Adult</td>\n",
       "      <td>143</td>\n",
       "      <td>eraser</td>\n",
       "      <td>11.03</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>Sara Shaffer</td>\n",
       "      <td>40</td>\n",
       "      <td>Adult</td>\n",
       "      <td>92</td>\n",
       "      <td>knife</td>\n",
       "      <td>0.20</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>Cathy George</td>\n",
       "      <td>31</td>\n",
       "      <td>Adult</td>\n",
       "      <td>100</td>\n",
       "      <td>wallet</td>\n",
       "      <td>10.95</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>Haiden Schmidt</td>\n",
       "      <td>45</td>\n",
       "      <td>Adult</td>\n",
       "      <td>131</td>\n",
       "      <td>vase</td>\n",
       "      <td>4.85</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "               Name  Age AgeGroup  Item ID Item Name  Item Price\n",
       "0  Junayd Pemberton   42    Adult      108    button        8.51\n",
       "1     Phebe Maguire   40    Adult      143    eraser       11.03\n",
       "2      Sara Shaffer   40    Adult       92     knife        0.20\n",
       "3      Cathy George   31    Adult      100    wallet       10.95\n",
       "4    Haiden Schmidt   45    Adult      131      vase        4.85"
      ]
     },
     "execution_count": 2,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "purchase_data.head()"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Customer Count"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "* Display the total number of customers\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Total Customers</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>576</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "   Total Customers\n",
       "0              576"
      ]
     },
     "execution_count": 3,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Calculate the number of customers\n",
    "\n",
    "\n",
    "# create a dataframe\n",
    "\n",
    "\n",
    "# show the dataframe\n"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Purchase Analysis (Total)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "* Run basic calculations to obtain number of unique items, average price, etc.\n",
    "\n",
    "\n",
    "* Create a summary data frame to hold the results\n",
    "\n",
    "\n",
    "* Optional: give the displayed data cleaner formatting\n",
    "\n",
    "\n",
    "* Display the summary data frame\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th># of Unique Items</th>\n",
       "      <th>Avg Item Price</th>\n",
       "      <th>Number of Item Purchases</th>\n",
       "      <th>Total of All Purchases</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>179</td>\n",
       "      <td>$5.54</td>\n",
       "      <td>780</td>\n",
       "      <td>$4,317.30</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "   # of Unique Items Avg Item Price  Number of Item Purchases  \\\n",
       "0                179          $5.54                       780   \n",
       "\n",
       "  Total of All Purchases  \n",
       "0              $4,317.30  "
      ]
     },
     "execution_count": 4,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# get the number of unique items\n",
    "\n",
    "\n",
    "# get the average price per item\n",
    "\n",
    "\n",
    "# get the number of purchases (count)\n",
    "\n",
    "\n",
    "# get the total of all items purchased (sum)\n",
    "\n",
    "\n",
    "# create the summary table\n",
    "\n",
    "\n",
    "# round the data in the summary table so that decimal amounts have 2 decimal places\n",
    "\n",
    "\n",
    "# format the Average Item Price to show the dollar sign and 2 decimal places\n",
    "\n",
    "\n",
    "# format the Total of All Purchases to show the dollar sign and 2 decimal places\n",
    "\n",
    "# display the summary table\n"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Customer Demographics"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "* Percentage and Count of Child Customers\n",
    "\n",
    "* Percentage and Count of Teen Customers\n",
    "\n",
    "* Percentage and Count of Adult Customers\n",
    "\n",
    "* Percentage and Count of Senior Citizen Customers\n",
    "\n",
    "\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Total</th>\n",
       "      <th>% of Customers</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>Adult</th>\n",
       "      <td>370</td>\n",
       "      <td>64.24%</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>Senior Citizen</th>\n",
       "      <td>118</td>\n",
       "      <td>20.49%</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>Teen</th>\n",
       "      <td>61</td>\n",
       "      <td>10.59%</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>Child</th>\n",
       "      <td>27</td>\n",
       "      <td>4.69%</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "                Total % of Customers\n",
       "Adult             370         64.24%\n",
       "Senior Citizen    118         20.49%\n",
       "Teen               61         10.59%\n",
       "Child              27          4.69%"
      ]
     },
     "execution_count": 5,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# take the value counts of the age groups (a customer may have more than one purchase, so drop the duplicate customers first)\n",
    "\n",
    "\n",
    "\n",
    "\n",
    "# calculate the percentages of the Age groups\n",
    "\n",
    "\n",
    "# create the customer demographics dataframe\n",
    "\n",
    "\n",
    "# round the decimal values to show 2 decimal places\n",
    "\n",
    "\n",
    "# display the DataFrame\n"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "\n",
    "## Purchasing Analysis (Age Group)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "* Run basic calculations to obtain purchase count, avg. purchase price, avg. purchase total per person etc. by age group\n",
    "\n",
    "\n",
    "\n",
    "\n",
    "* Create a summary data frame to hold the results\n",
    "\n",
    "\n",
    "* Optional: give the displayed data cleaner formatting\n",
    "\n",
    "\n",
    "* Display the summary data frame"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Purchase Count</th>\n",
       "      <th>Avg Purchase Price</th>\n",
       "      <th>Total Purchase Amount</th>\n",
       "      <th>Avg Total Purchase Per Customer</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>Adult</th>\n",
       "      <td>494</td>\n",
       "      <td>$5.57</td>\n",
       "      <td>$2,749.45</td>\n",
       "      <td>$7.43</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>Child</th>\n",
       "      <td>32</td>\n",
       "      <td>$5.09</td>\n",
       "      <td>$162.89</td>\n",
       "      <td>$6.03</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>Senior Citizen</th>\n",
       "      <td>167</td>\n",
       "      <td>$5.40</td>\n",
       "      <td>$901.40</td>\n",
       "      <td>$7.64</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>Teen</th>\n",
       "      <td>87</td>\n",
       "      <td>$5.79</td>\n",
       "      <td>$503.56</td>\n",
       "      <td>$8.26</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "                Purchase Count Avg Purchase Price Total Purchase Amount  \\\n",
       "Adult                      494              $5.57             $2,749.45   \n",
       "Child                       32              $5.09               $162.89   \n",
       "Senior Citizen             167              $5.40               $901.40   \n",
       "Teen                        87              $5.79               $503.56   \n",
       "\n",
       "               Avg Total Purchase Per Customer  \n",
       "Adult                                    $7.43  \n",
       "Child                                    $6.03  \n",
       "Senior Citizen                           $7.64  \n",
       "Teen                                     $8.26  "
      ]
     },
     "execution_count": 6,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# run basic calculations (USE GROUP BY!!!)\n",
    "# calculate the total counts of purchases by each Age Group\n",
    "\n",
    "# calculate the average amount per purchase per Age Group\n",
    "\n",
    "# calculate the total amounts of purchases per Age Group\n",
    "\n",
    "\n",
    "# Calculate the normalized purchasing (Average total per person in each age group) \n",
    "# HINT: use the totals from the customer demographics data frame above\n",
    "\n",
    "\n",
    "# create the data frame\n",
    "\n",
    "\n",
    "# format the data frame dollar columns\n",
    "\n",
    "\n",
    "# display the data frame\n"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Age Demographics"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "* Establish bins for ages\n",
    "\n",
    "\n",
    "* Categorize the existing customers using the age bins. Hint: use pd.cut()\n",
    "\n",
    "\n",
    "* Calculate the numbers and percentages by age group\n",
    "\n",
    "\n",
    "* Create a summary data frame to hold the results\n",
    "\n",
    "\n",
    "* Optional: round the percentage column to two decimal points\n",
    "\n",
    "\n",
    "* Display Age Demographics Table\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Total Count</th>\n",
       "      <th>Percentage of Customers</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>&lt;13</th>\n",
       "      <td>27</td>\n",
       "      <td>4.69%</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>13-20</th>\n",
       "      <td>61</td>\n",
       "      <td>10.59%</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>21-30</th>\n",
       "      <td>81</td>\n",
       "      <td>14.06%</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>31-40</th>\n",
       "      <td>89</td>\n",
       "      <td>15.45%</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>41-50</th>\n",
       "      <td>84</td>\n",
       "      <td>14.58%</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>50-65</th>\n",
       "      <td>116</td>\n",
       "      <td>20.14%</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>65+</th>\n",
       "      <td>118</td>\n",
       "      <td>20.49%</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "       Total Count Percentage of Customers\n",
       "<13             27                   4.69%\n",
       "13-20           61                  10.59%\n",
       "21-30           81                  14.06%\n",
       "31-40           89                  15.45%\n",
       "41-50           84                  14.58%\n",
       "50-65          116                  20.14%\n",
       "65+            118                  20.49%"
      ]
     },
     "execution_count": 7,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# create the bins for the ages\n",
    "\n",
    "\n",
    "# use the age demo data frame to cut the ages into their bins and make a new data frame column\n",
    "\n",
    "\n",
    "# calculate the numbers and percentages by each age group\n",
    "\n",
    "# first, calculate the total count for each age group\n",
    "\n",
    "# calculate the percentages within each age group\n",
    "\n",
    "\n",
    "\n",
    "# build the dataframe\n",
    "\n",
    "\n",
    "\n",
    "# display the dataframe (sort by the pandas index)\n"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Purchasing Analysis (Age)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "* Bin the purchase_data data frame by age\n",
    "\n",
    "\n",
    "* Run basic calculations to obtain purchase count, avg. purchase price, avg. purchase total per person etc. in the table below\n",
    "\n",
    "\n",
    "* Create a summary data frame to hold the results\n",
    "\n",
    "\n",
    "* Optional: give the displayed data cleaner formatting\n",
    "\n",
    "\n",
    "* Display the summary data frame"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Name</th>\n",
       "      <th>Age</th>\n",
       "      <th>AgeGroup</th>\n",
       "      <th>Item ID</th>\n",
       "      <th>Item Name</th>\n",
       "      <th>Item Price</th>\n",
       "      <th>Age Range</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>Junayd Pemberton</td>\n",
       "      <td>42</td>\n",
       "      <td>Adult</td>\n",
       "      <td>108</td>\n",
       "      <td>button</td>\n",
       "      <td>8.51</td>\n",
       "      <td>41-50</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>Phebe Maguire</td>\n",
       "      <td>40</td>\n",
       "      <td>Adult</td>\n",
       "      <td>143</td>\n",
       "      <td>eraser</td>\n",
       "      <td>11.03</td>\n",
       "      <td>41-50</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>Sara Shaffer</td>\n",
       "      <td>40</td>\n",
       "      <td>Adult</td>\n",
       "      <td>92</td>\n",
       "      <td>knife</td>\n",
       "      <td>0.20</td>\n",
       "      <td>41-50</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>Cathy George</td>\n",
       "      <td>31</td>\n",
       "      <td>Adult</td>\n",
       "      <td>100</td>\n",
       "      <td>wallet</td>\n",
       "      <td>10.95</td>\n",
       "      <td>31-40</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>Haiden Schmidt</td>\n",
       "      <td>45</td>\n",
       "      <td>Adult</td>\n",
       "      <td>131</td>\n",
       "      <td>vase</td>\n",
       "      <td>4.85</td>\n",
       "      <td>41-50</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "               Name  Age AgeGroup  Item ID Item Name  Item Price Age Range\n",
       "0  Junayd Pemberton   42    Adult      108    button        8.51     41-50\n",
       "1     Phebe Maguire   40    Adult      143    eraser       11.03     41-50\n",
       "2      Sara Shaffer   40    Adult       92     knife        0.20     41-50\n",
       "3      Cathy George   31    Adult      100    wallet       10.95     31-40\n",
       "4    Haiden Schmidt   45    Adult      131      vase        4.85     41-50"
      ]
     },
     "execution_count": 8,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# bin the purchase_data data frame by age using the age bins\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 9,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Purchase Count</th>\n",
       "      <th>Avg Purchase Price</th>\n",
       "      <th>Total Purchase Amount</th>\n",
       "      <th>Avg Total Purchase Per Customer</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>&lt;13</th>\n",
       "      <td>32</td>\n",
       "      <td>$5.09</td>\n",
       "      <td>$162.89</td>\n",
       "      <td>$6.03</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>13-20</th>\n",
       "      <td>87</td>\n",
       "      <td>$5.79</td>\n",
       "      <td>$503.56</td>\n",
       "      <td>$8.26</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>21-30</th>\n",
       "      <td>111</td>\n",
       "      <td>$5.43</td>\n",
       "      <td>$602.96</td>\n",
       "      <td>$7.44</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>31-40</th>\n",
       "      <td>113</td>\n",
       "      <td>$6.58</td>\n",
       "      <td>$743.13</td>\n",
       "      <td>$8.35</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>41-50</th>\n",
       "      <td>110</td>\n",
       "      <td>$5.11</td>\n",
       "      <td>$561.55</td>\n",
       "      <td>$6.69</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>50-65</th>\n",
       "      <td>160</td>\n",
       "      <td>$5.26</td>\n",
       "      <td>$841.81</td>\n",
       "      <td>$7.26</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>65+</th>\n",
       "      <td>167</td>\n",
       "      <td>$5.40</td>\n",
       "      <td>$901.40</td>\n",
       "      <td>$7.64</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "       Purchase Count Avg Purchase Price Total Purchase Amount  \\\n",
       "<13                32              $5.09               $162.89   \n",
       "13-20              87              $5.79               $503.56   \n",
       "21-30             111              $5.43               $602.96   \n",
       "31-40             113              $6.58               $743.13   \n",
       "41-50             110              $5.11               $561.55   \n",
       "50-65             160              $5.26               $841.81   \n",
       "65+               167              $5.40               $901.40   \n",
       "\n",
       "      Avg Total Purchase Per Customer  \n",
       "<13                             $6.03  \n",
       "13-20                           $8.26  \n",
       "21-30                           $7.44  \n",
       "31-40                           $8.35  \n",
       "41-50                           $6.69  \n",
       "50-65                           $7.26  \n",
       "65+                             $7.64  "
      ]
     },
     "execution_count": 9,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# run basic calculations (USE GROUP BY!!!)\n",
    "# calculate the total counts of purchases by each Age Range\n",
    "\n",
    "# calculate the average amount per purchase per Age Range\n",
    "\n",
    "# calculate the total amounts of purchases per Age Range\n",
    "\n",
    "\n",
    "# Calculate the normalized purchasing (Average total per person in each age group) \n",
    "# HINT: use the total count from the age demographics data frame from a few cells ago\n",
    "\n",
    "\n",
    "# create the data frame\n",
    "\n",
    "\n",
    "# format the data frame dollar columns\n",
    "\n",
    "\n",
    "# display the data frame\n"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Top Spending Customers"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "* Run basic calculations to obtain the results in the table below\n",
    "\n",
    "\n",
    "* Create a summary data frame to hold the results\n",
    "\n",
    "\n",
    "* Sort the total purchase value column in descending order\n",
    "\n",
    "\n",
    "* Optional: give the displayed data cleaner formatting\n",
    "\n",
    "\n",
    "* Display a preview of the summary data frame\n",
    "\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 10,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Purchase Count</th>\n",
       "      <th>Avg Purchase Price</th>\n",
       "      <th>Total of all Purchases</th>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>Name</th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>Diesel England</th>\n",
       "      <td>3</td>\n",
       "      <td>$12.75</td>\n",
       "      <td>$38.25</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>Ruby-May Monaghan</th>\n",
       "      <td>4</td>\n",
       "      <td>$9.03</td>\n",
       "      <td>$36.10</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>Naomi John</th>\n",
       "      <td>5</td>\n",
       "      <td>$6.86</td>\n",
       "      <td>$34.31</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>Callan Amos</th>\n",
       "      <td>3</td>\n",
       "      <td>$10.57</td>\n",
       "      <td>$31.72</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>Kameron Collins</th>\n",
       "      <td>3</td>\n",
       "      <td>$10.01</td>\n",
       "      <td>$30.02</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "                   Purchase Count Avg Purchase Price Total of all Purchases\n",
       "Name                                                                       \n",
       "Diesel England                  3             $12.75                 $38.25\n",
       "Ruby-May Monaghan               4              $9.03                 $36.10\n",
       "Naomi John                      5              $6.86                 $34.31\n",
       "Callan Amos                     3             $10.57                 $31.72\n",
       "Kameron Collins                 3             $10.01                 $30.02"
      ]
     },
     "execution_count": 10,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# identify the top spending customers (HINT: GROUP BY the name column)\n",
    "# calculate the purchase count\n",
    "\n",
    "# calculate the average price per user's purchase\n",
    "\n",
    "# calculate the total of all of the user's purchases\n",
    "\n",
    "\n",
    "# make a data frame\n",
    "\n",
    "\n",
    "# sort the data frame in descending order by each customer's total of all purchases, then display it\n",
    "\n",
    "\n",
    "# format the data frame dollar columns\n",
    "\n",
    "\n",
    "# display the data frame\n"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Most Popular Items"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "* Retrieve the Item ID, Item Name, and Item Price columns\n",
    "\n",
    "\n",
    "* Group by Item ID and Item Name. Perform calculations to obtain purchase count, average item price, and total purchase value\n",
    "\n",
    "\n",
    "* Create a summary data frame to hold the results\n",
    "\n",
    "\n",
    "* Sort the purchase count column in descending order\n",
    "\n",
    "\n",
    "* Optional: give the displayed data cleaner formatting\n",
    "\n",
    "\n",
    "* Display a preview of the summary data frame\n",
    "\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 11,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th># of Purchases</th>\n",
       "      <th>Item Price</th>\n",
       "      <th>Total Purchase Value</th>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>Item ID</th>\n",
       "      <th>Item Name</th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>92</th>\n",
       "      <th>knife</th>\n",
       "      <td>13</td>\n",
       "      <td>$7.84</td>\n",
       "      <td>$101.92</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>178</th>\n",
       "      <th>bowl</th>\n",
       "      <td>12</td>\n",
       "      <td>$4.98</td>\n",
       "      <td>$59.73</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>145</th>\n",
       "      <th>twezzers</th>\n",
       "      <td>9</td>\n",
       "      <td>$8.09</td>\n",
       "      <td>$72.80</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>132</th>\n",
       "      <th>cookie jar</th>\n",
       "      <td>9</td>\n",
       "      <td>$5.36</td>\n",
       "      <td>$48.28</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>108</th>\n",
       "      <th>button</th>\n",
       "      <td>9</td>\n",
       "      <td>$7.02</td>\n",
       "      <td>$63.17</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "                    # of Purchases Item Price Total Purchase Value\n",
       "Item ID Item Name                                                 \n",
       "92      knife                   13      $7.84              $101.92\n",
       "178     bowl                    12      $4.98               $59.73\n",
       "145     twezzers                 9      $8.09               $72.80\n",
       "132     cookie jar               9      $5.36               $48.28\n",
       "108     button                   9      $7.02               $63.17"
      ]
     },
     "execution_count": 11,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Retrieve the Item ID, Item Name, and Item Price columns\n",
    "itemData = purchase_data.loc[:, [\"Item ID\", \"Item Name\", \"Item Price\"]]\n",
    "\n",
    "# Group by Item ID and Item Name. Perform calculations to obtain purchase count, average item price, and total purchase value\n",
    "itemCounts = itemData.groupby([\"Item ID\", \"Item Name\"]).count()[\"Item Price\"].rename(\"# of Purchases\")\n",
    "avgItemPrice = itemData.groupby([\"Item ID\", \"Item Name\"]).mean()[\"Item Price\"]\n",
    "totalItemPurchase = itemData.groupby([\"Item ID\", \"Item Name\"]).sum()[\"Item Price\"].rename(\"Total Purchase Value\")\n",
    "\n",
    "\n",
    "# create the data frame\n",
    "itemDF = pd.DataFrame({\n",
    "    \"# of Purchases\": itemCounts,\n",
    "    \"Item Price\": avgItemPrice,\n",
    "    \"Total Purchase Value\": totalItemPurchase\n",
    "})\n",
    "\n",
    "# sort the data frame by the number of purchases\n",
    "mostPopularItemDF = itemDF.sort_values(\"# of Purchases\", ascending=False)\n",
    "\n",
    "# format the data frame dollar columns\n",
    "mostPopularItemDF[\"Item Price\"] = mostPopularItemDF[\"Item Price\"].map(\"${:,.2f}\".format)\n",
    "mostPopularItemDF[\"Total Purchase Value\"] = mostPopularItemDF[\"Total Purchase Value\"].map(\"${:,.2f}\".format)\n",
    "\n",
    "# show the data frame\n",
    "mostPopularItemDF.head()"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Most Profitable Items"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "* Sort the above table by total purchase value in descending order\n",
    "\n",
    "\n",
    "* Optional: give the displayed data cleaner formatting\n",
    "\n",
    "\n",
    "* Display a preview of the data frame\n",
    "\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 12,
   "metadata": {
    "scrolled": true
   },
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th># of Purchases</th>\n",
       "      <th>Item Price</th>\n",
       "      <th>Total Purchase Value</th>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>Item ID</th>\n",
       "      <th>Item Name</th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>92</th>\n",
       "      <th>knife</th>\n",
       "      <td>13</td>\n",
       "      <td>$7.84</td>\n",
       "      <td>$101.92</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>145</th>\n",
       "      <th>twezzers</th>\n",
       "      <td>9</td>\n",
       "      <td>$8.09</td>\n",
       "      <td>$72.80</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>108</th>\n",
       "      <th>button</th>\n",
       "      <td>9</td>\n",
       "      <td>$7.02</td>\n",
       "      <td>$63.17</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>7</th>\n",
       "      <th>door</th>\n",
       "      <td>7</td>\n",
       "      <td>$8.89</td>\n",
       "      <td>$62.21</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>178</th>\n",
       "      <th>bowl</th>\n",
       "      <td>12</td>\n",
       "      <td>$4.98</td>\n",
       "      <td>$59.73</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "                   # of Purchases Item Price Total Purchase Value\n",
       "Item ID Item Name                                                \n",
       "92      knife                  13      $7.84              $101.92\n",
       "145     twezzers                9      $8.09               $72.80\n",
       "108     button                  9      $7.02               $63.17\n",
       "7       door                    7      $8.89               $62.21\n",
       "178     bowl                   12      $4.98               $59.73"
      ]
     },
     "execution_count": 12,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Sort the above table by total purchase value in descending order\n",
    "mostProfitableItemDF = itemDF.sort_values(\"Total Purchase Value\", ascending=False)\n",
    "\n",
    "# format the data frame dollar columns\n",
    "mostProfitableItemDF[\"Item Price\"] = mostProfitableItemDF[\"Item Price\"].map(\"${:,.2f}\".format)\n",
    "mostProfitableItemDF[\"Total Purchase Value\"] = mostProfitableItemDF[\"Total Purchase Value\"].map(\"${:,.2f}\".format)\n",
    "\n",
    "mostProfitableItemDF.head()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "anaconda-cloud": {},
  "kernel_info": {
   "name": "python3"
  },
  "kernelspec": {
   "display_name": "Python 3",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.8.8"
  },
  "latex_envs": {
   "LaTeX_envs_menu_present": true,
   "autoclose": false,
   "autocomplete": true,
   "bibliofile": "biblio.bib",
   "cite_by": "apalike",
   "current_citInitial": 1,
   "eqLabelWithNumbers": true,
   "eqNumInitial": 1,
   "hotkeys": {
    "equation": "Ctrl-E",
    "itemize": "Ctrl-I"
   },
   "labels_anchors": false,
   "latex_user_defs": false,
   "report_style_numbering": false,
   "user_envs_cfg": false
  },
  "nteract": {
   "version": "0.2.0"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 2
}